Some(token) => token,
None => {
let src = try!(SourceId::crates_io(config));
- let mut src = RegistrySource::new(&src, config);
+ let mut src = RegistrySource::remote(&src, config);
try!(src.update());
- let config = try!(src.config());
+ let config = try!(src.config()).unwrap();
let host = options.flag_host.clone().unwrap_or(config.api);
println!("please visit {}me and paste the API Token below", host);
let mut line = String::new();
};
Box::new(PathSource::new(&path, self, config))
}
- Kind::Registry => Box::new(RegistrySource::new(self, config)),
+ Kind::Registry => Box::new(RegistrySource::remote(self, config)),
}
}
None => try!(SourceId::crates_io(config)),
};
let api_host = {
- let mut src = RegistrySource::new(&sid, config);
+ let mut src = RegistrySource::remote(&sid, config);
try!(src.update().chain_error(|| {
human(format!("failed to update {}", sid))
}));
- (try!(src.config())).api
+ (try!(src.config())).unwrap().api
};
let handle = try!(http_handle(config));
Ok((Registry::new_handle(api_host, token, handle), sid))
+++ /dev/null
-//! A `Source` for registry-based packages.
-//!
-//! # What's a Registry?
-//!
-//! Registries are central locations where packages can be uploaded to,
-//! discovered, and searched for. The purpose of a registry is to have a
-//! location that serves as permanent storage for versions of a crate over time.
-//!
-//! Compared to git sources, a registry provides many packages as well as many
-//! versions simultaneously. Git sources can also have commits deleted through
-//! rebasings where registries cannot have their versions deleted.
-//!
-//! # The Index of a Registry
-//!
-//! One of the major difficulties with a registry is that hosting so many
-//! packages may quickly run into performance problems when dealing with
-//! dependency graphs. It's infeasible for cargo to download the entire contents
-//! of the registry just to resolve one package's dependencies, for example. As
-//! a result, cargo needs some efficient method of querying what packages are
-//! available on a registry, what versions are available, and what the
-//! dependencies for each version is.
-//!
-//! One method of doing so would be having the registry expose an HTTP endpoint
-//! which can be queried with a list of packages and a response of their
-//! dependencies and versions is returned. This is somewhat inefficient however
-//! as we may have to hit the endpoint many times and we may have already
-//! queried for much of the data locally already (for other packages, for
-//! example). This also involves inventing a transport format between the
-//! registry and Cargo itself, so this route was not taken.
-//!
-//! Instead, Cargo communicates with registries through a git repository
-//! referred to as the Index. The Index of a registry is essentially an easily
-//! query-able version of the registry's database for a list of versions of a
-//! package as well as a list of dependencies for each version.
-//!
-//! Using git to host this index provides a number of benefits:
-//!
-//! * The entire index can be stored efficiently locally on disk. This means
-//! that all queries of a registry can happen locally and don't need to touch
-//! the network.
-//!
-//! * Updates of the index are quite efficient. Using git buys incremental
-//! updates, compressed transmission, etc for free. The index must be updated
-//! each time we need fresh information from a registry, but this is one
-//! update of a git repository that probably hasn't changed a whole lot so
-//! it shouldn't be too expensive.
-//!
-//! Additionally, each modification to the index is just appending a line at
-//! the end of a file (the exact format is described later). This means that
-//! the commits for an index are quite small and easily applied/compressable.
-//!
-//! ## The format of the Index
-//!
-//! The index is a store for the list of versions for all packages known, so its
-//! format on disk is optimized slightly to ensure that `ls registry` doesn't
-//! produce a list of all packages ever known. The index also wants to ensure
-//! that there's not a million files which may actually end up hitting
-//! filesystem limits at some point. To this end, a few decisions were made
-//! about the format of the registry:
-//!
-//! 1. Each crate will have one file corresponding to it. Each version for a
-//! crate will just be a line in this file.
-//! 2. There will be two tiers of directories for crate names, under which
-//! crates corresponding to those tiers will be located.
-//!
-//! As an example, this is an example hierarchy of an index:
-//!
-//! ```notrust
-//! .
-//! ├── 3
-//! │ └── u
-//! │ └── url
-//! ├── bz
-//! │ └── ip
-//! │ └── bzip2
-//! ├── config.json
-//! ├── en
-//! │ └── co
-//! │ └── encoding
-//! └── li
-//! ├── bg
-//! │ └── libgit2
-//! └── nk
-//! └── link-config
-//! ```
-//!
-//! The root of the index contains a `config.json` file with a few entries
-//! corresponding to the registry (see `RegistryConfig` below).
-//!
-//! Otherwise, there are three numbered directories (1, 2, 3) for crates with
-//! names 1, 2, and 3 characters in length. The 1/2 directories simply have the
-//! crate files underneath them, while the 3 directory is sharded by the first
-//! letter of the crate name.
-//!
-//! Otherwise the top-level directory contains many two-letter directory names,
-//! each of which has many sub-folders with two letters. At the end of all these
-//! are the actual crate files themselves.
-//!
-//! The purpose of this layout is to hopefully cut down on `ls` sizes as well as
-//! efficient lookup based on the crate name itself.
-//!
-//! ## Crate files
-//!
-//! Each file in the index is the history of one crate over time. Each line in
-//! the file corresponds to one version of a crate, stored in JSON format (see
-//! the `RegistryPackage` structure below).
-//!
-//! As new versions are published, new lines are appended to this file. The only
-//! modifications to this file that should happen over time are yanks of a
-//! particular version.
-//!
-//! # Downloading Packages
-//!
-//! The purpose of the Index was to provide an efficient method to resolve the
-//! dependency graph for a package. So far we only required one network
-//! interaction to update the registry's repository (yay!). After resolution has
-//! been performed, however we need to download the contents of packages so we
-//! can read the full manifest and build the source code.
-//!
-//! To accomplish this, this source's `download` method will make an HTTP
-//! request per-package requested to download tarballs into a local cache. These
-//! tarballs will then be unpacked into a destination folder.
-//!
-//! Note that because versions uploaded to the registry are frozen forever that
-//! the HTTP download and unpacking can all be skipped if the version has
-//! already been downloaded and unpacked. This caching allows us to only
-//! download a package when absolutely necessary.
-//!
-//! # Filesystem Hierarchy
-//!
-//! Overall, the `$HOME/.cargo` looks like this when talking about the registry:
-//!
-//! ```notrust
-//! # A folder under which all registry metadata is hosted (similar to
-//! # $HOME/.cargo/git)
-//! $HOME/.cargo/registry/
-//!
-//! # For each registry that cargo knows about (keyed by hostname + hash)
-//! # there is a folder which is the checked out version of the index for
-//! # the registry in this location. Note that this is done so cargo can
-//! # support multiple registries simultaneously
-//! index/
-//! registry1-<hash>/
-//! registry2-<hash>/
-//! ...
-//!
-//! # This folder is a cache for all downloaded tarballs from a registry.
-//! # Once downloaded and verified, a tarball never changes.
-//! cache/
-//! registry1-<hash>/<pkg>-<version>.crate
-//! ...
-//!
-//! # Location in which all tarballs are unpacked. Each tarball is known to
-//! # be frozen after downloading, so transitively this folder is also
-//! # frozen once its unpacked (it's never unpacked again)
-//! src/
-//! registry1-<hash>/<pkg>-<version>/...
-//! ...
-//! ```
-
-use std::collections::HashMap;
-use std::fs::File;
-use std::io::SeekFrom;
-use std::io::prelude::*;
-use std::path::{PathBuf, Path};
-
-use curl::easy::Easy;
-use flate2::read::GzDecoder;
-use git2;
-use rustc_serialize::hex::ToHex;
-use rustc_serialize::json;
-use tar::Archive;
-use url::Url;
-
-use core::{Source, SourceId, PackageId, Package, Summary, Registry};
-use core::dependency::{Dependency, DependencyInner, Kind};
-use sources::{PathSource, git};
-use util::{CargoResult, Config, internal, ChainError, ToUrl, human};
-use util::{hex, Sha256, paths, Filesystem, FileLock};
-use util::network;
-use ops;
-
-const INDEX_LOCK: &'static str = ".cargo-index-lock";
-pub static CRATES_IO: &'static str = "https://github.com/rust-lang/crates.io-index";
-
-pub struct RegistrySource<'cfg> {
- source_id: SourceId,
- checkout_path: Filesystem,
- cache_path: Filesystem,
- src_path: Filesystem,
- config: &'cfg Config,
- handle: Option<Easy>,
- hashes: HashMap<(String, String), String>, // (name, vers) => cksum
- cache: HashMap<String, Vec<(Summary, bool)>>,
- updated: bool,
-}
-
-#[derive(RustcDecodable)]
-pub struct RegistryConfig {
- /// Download endpoint for all crates. This will be appended with
- /// `/<crate>/<version>/download` and then will be hit with an HTTP GET
- /// request to download the tarball for a crate.
- pub dl: String,
-
- /// API endpoint for the registry. This is what's actually hit to perform
- /// operations like yanks, owner modifications, publish new crates, etc.
- pub api: String,
-}
-
-#[derive(RustcDecodable)]
-struct RegistryPackage {
- name: String,
- vers: String,
- deps: Vec<RegistryDependency>,
- features: HashMap<String, Vec<String>>,
- cksum: String,
- yanked: Option<bool>,
-}
-
-#[derive(RustcDecodable)]
-struct RegistryDependency {
- name: String,
- req: String,
- features: Vec<String>,
- optional: bool,
- default_features: bool,
- target: Option<String>,
- kind: Option<String>,
-}
-
-impl<'cfg> RegistrySource<'cfg> {
- pub fn new(source_id: &SourceId,
- config: &'cfg Config) -> RegistrySource<'cfg> {
- let hash = hex::short_hash(source_id);
- let ident = source_id.url().host_str().unwrap_or("").to_string();
- let part = format!("{}-{}", ident, hash);
- RegistrySource {
- checkout_path: config.registry_index_path().join(&part),
- cache_path: config.registry_cache_path().join(&part),
- src_path: config.registry_source_path().join(&part),
- config: config,
- source_id: source_id.clone(),
- handle: None,
- hashes: HashMap::new(),
- cache: HashMap::new(),
- updated: false,
- }
- }
-
- /// Decode the configuration stored within the registry.
- ///
- /// This requires that the index has been at least checked out.
- pub fn config(&self) -> CargoResult<RegistryConfig> {
- let lock = try!(self.checkout_path.open_ro(Path::new(INDEX_LOCK),
- self.config,
- "the registry index"));
- let path = lock.path().parent().unwrap();
- let contents = try!(paths::read(&path.join("config.json")));
- let config = try!(json::decode(&contents));
- Ok(config)
- }
-
- /// Download the given package from the given url into the local cache.
- ///
- /// This will perform the HTTP request to fetch the package. This function
- /// will only succeed if the HTTP download was successful and the file is
- /// then ready for inspection.
- ///
- /// No action is taken if the package is already downloaded.
- fn download_package(&mut self, pkg: &PackageId, url: &Url)
- -> CargoResult<FileLock> {
- let filename = format!("{}-{}.crate", pkg.name(), pkg.version());
- let path = Path::new(&filename);
- let mut dst = try!(self.cache_path.open_rw(path, self.config, &filename));
- let meta = try!(dst.file().metadata());
- if meta.len() > 0 {
- return Ok(dst)
- }
- try!(self.config.shell().status("Downloading", pkg));
-
- let expected_hash = try!(self.hash(pkg));
- let handle = match self.handle {
- Some(ref mut handle) => handle,
- None => {
- self.handle = Some(try!(ops::http_handle(self.config)));
- self.handle.as_mut().unwrap()
- }
- };
- // TODO: don't download into memory, but ensure that if we ctrl-c a
- // download we should resume either from the start or the middle
- // on the next time
- try!(handle.get(true));
- try!(handle.url(&url.to_string()));
- try!(handle.follow_location(true));
- let mut state = Sha256::new();
- let mut body = Vec::new();
- {
- let mut handle = handle.transfer();
- try!(handle.write_function(|buf| {
- state.update(buf);
- body.extend_from_slice(buf);
- Ok(buf.len())
- }));
- try!(network::with_retry(self.config, || {
- handle.perform()
- }))
- }
- let code = try!(handle.response_code());
- if code != 200 && code != 0 {
- bail!("failed to get 200 response from `{}`, got {}", url, code)
- }
-
- // Verify what we just downloaded
- if state.finish().to_hex() != expected_hash {
- bail!("failed to verify the checksum of `{}`", pkg)
- }
-
- try!(dst.write_all(&body));
- try!(dst.seek(SeekFrom::Start(0)));
- Ok(dst)
- }
-
- /// Return the hash listed for a specified PackageId.
- fn hash(&mut self, pkg: &PackageId) -> CargoResult<String> {
- let key = (pkg.name().to_string(), pkg.version().to_string());
- if let Some(s) = self.hashes.get(&key) {
- return Ok(s.clone())
- }
- // Ok, we're missing the key, so parse the index file to load it.
- try!(self.summaries(pkg.name()));
- self.hashes.get(&key).chain_error(|| {
- internal(format!("no hash listed for {}", pkg))
- }).map(|s| s.clone())
- }
-
- /// Unpacks a downloaded package into a location where it's ready to be
- /// compiled.
- ///
- /// No action is taken if the source looks like it's already unpacked.
- fn unpack_package(&self,
- pkg: &PackageId,
- tarball: &FileLock)
- -> CargoResult<PathBuf> {
- let dst = self.src_path.join(&format!("{}-{}", pkg.name(),
- pkg.version()));
- try!(dst.create_dir());
- // Note that we've already got the `tarball` locked above, and that
- // implies a lock on the unpacked destination as well, so this access
- // via `into_path_unlocked` should be ok.
- let dst = dst.into_path_unlocked();
- let ok = dst.join(".cargo-ok");
- if ok.exists() {
- return Ok(dst)
- }
-
- let gz = try!(GzDecoder::new(tarball.file()));
- let mut tar = Archive::new(gz);
- try!(tar.unpack(dst.parent().unwrap()));
- try!(File::create(&ok));
- Ok(dst)
- }
-
- /// Parse the on-disk metadata for the package provided
- pub fn summaries(&mut self, name: &str) -> CargoResult<&Vec<(Summary, bool)>> {
- if self.cache.contains_key(name) {
- return Ok(self.cache.get(name).unwrap());
- }
- let lock = self.checkout_path.open_ro(Path::new(INDEX_LOCK),
- self.config,
- "the registry index");
- let file = lock.and_then(|lock| {
- let path = lock.path().parent().unwrap();
- let fs_name = name.chars().flat_map(|c| {
- c.to_lowercase()
- }).collect::<String>();
-
- // see module comment for why this is structured the way it is
- let path = match fs_name.len() {
- 1 => path.join("1").join(&fs_name),
- 2 => path.join("2").join(&fs_name),
- 3 => path.join("3").join(&fs_name[..1]).join(&fs_name),
- _ => path.join(&fs_name[0..2])
- .join(&fs_name[2..4])
- .join(&fs_name),
- };
- File::open(&path).map_err(human)
- });
- let summaries = match file {
- Ok(mut f) => {
- let mut contents = String::new();
- try!(f.read_to_string(&mut contents));
- let ret: CargoResult<Vec<(Summary, bool)>>;
- ret = contents.lines().filter(|l| l.trim().len() > 0)
- .map(|l| self.parse_registry_package(l))
- .collect();
- try!(ret.chain_error(|| {
- internal(format!("failed to parse registry's information \
- for: {}", name))
- }))
- }
- Err(..) => Vec::new(),
- };
- let summaries = summaries.into_iter().filter(|summary| {
- summary.0.package_id().name() == name
- }).collect();
- self.cache.insert(name.to_string(), summaries);
- Ok(self.cache.get(name).unwrap())
- }
-
- /// Parse a line from the registry's index file into a Summary for a
- /// package.
- ///
- /// The returned boolean is whether or not the summary has been yanked.
- fn parse_registry_package(&mut self, line: &str)
- -> CargoResult<(Summary, bool)> {
- let RegistryPackage {
- name, vers, cksum, deps, features, yanked
- } = try!(json::decode::<RegistryPackage>(line));
- let pkgid = try!(PackageId::new(&name, &vers, &self.source_id));
- let deps: CargoResult<Vec<Dependency>> = deps.into_iter().map(|dep| {
- self.parse_registry_dependency(dep)
- }).collect();
- let deps = try!(deps);
- let summary = try!(Summary::new(pkgid, deps, features));
- let summary = summary.set_checksum(cksum.clone());
- self.hashes.insert((name, vers), cksum);
- Ok((summary, yanked.unwrap_or(false)))
- }
-
- /// Converts an encoded dependency in the registry to a cargo dependency
- fn parse_registry_dependency(&self, dep: RegistryDependency)
- -> CargoResult<Dependency> {
- let RegistryDependency {
- name, req, features, optional, default_features, target, kind
- } = dep;
-
- let dep = try!(DependencyInner::parse(&name, Some(&req),
- &self.source_id));
- let kind = match kind.as_ref().map(|s| &s[..]).unwrap_or("") {
- "dev" => Kind::Development,
- "build" => Kind::Build,
- _ => Kind::Normal,
- };
-
- let platform = match target {
- Some(target) => Some(try!(target.parse())),
- None => None,
- };
-
- // Unfortunately older versions of cargo and/or the registry ended up
- // publishing lots of entries where the features array contained the
- // empty feature, "", inside. This confuses the resolution process much
- // later on and these features aren't actually valid, so filter them all
- // out here.
- let features = features.into_iter().filter(|s| !s.is_empty()).collect();
-
- Ok(dep.set_optional(optional)
- .set_default_features(default_features)
- .set_features(features)
- .set_platform(platform)
- .set_kind(kind)
- .into_dependency())
- }
-
- /// Actually perform network operations to update the registry
- fn do_update(&mut self) -> CargoResult<()> {
- if self.updated {
- return Ok(())
- }
- try!(self.checkout_path.create_dir());
- let lock = try!(self.checkout_path.open_rw(Path::new(INDEX_LOCK),
- self.config,
- "the registry index"));
- let path = lock.path().parent().unwrap();
-
- try!(self.config.shell().status("Updating",
- format!("registry `{}`", self.source_id.url())));
- let repo = try!(git2::Repository::open(path).or_else(|_| {
- let _ = lock.remove_siblings();
- git2::Repository::init(path)
- }));
-
- // git fetch origin
- let url = self.source_id.url().to_string();
- let refspec = "refs/heads/*:refs/remotes/origin/*";
-
- try!(git::fetch(&repo, &url, refspec, &self.config).chain_error(|| {
- human(format!("failed to fetch `{}`", url))
- }));
-
- // git reset --hard origin/master
- let reference = "refs/remotes/origin/master";
- let oid = try!(repo.refname_to_id(reference));
- trace!("[{}] updating to rev {}", self.source_id, oid);
- let object = try!(repo.find_object(oid, None));
- try!(repo.reset(&object, git2::ResetType::Hard, None));
- self.updated = true;
- self.cache.clear();
- Ok(())
- }
-}
-
-impl<'cfg> Registry for RegistrySource<'cfg> {
- fn query(&mut self, dep: &Dependency) -> CargoResult<Vec<Summary>> {
- // If this is a precise dependency, then it came from a lockfile and in
- // theory the registry is known to contain this version. If, however, we
- // come back with no summaries, then our registry may need to be
- // updated, so we fall back to performing a lazy update.
- if dep.source_id().precise().is_some() {
- let mut summaries = try!(self.summaries(dep.name())).iter().map(|s| {
- s.0.clone()
- }).collect::<Vec<_>>();
- if try!(summaries.query(dep)).is_empty() {
- try!(self.do_update());
- }
- }
-
- let mut summaries = {
- let summaries = try!(self.summaries(dep.name()));
- summaries.iter().filter(|&&(_, yanked)| {
- dep.source_id().precise().is_some() || !yanked
- }).map(|s| s.0.clone()).collect::<Vec<_>>()
- };
-
- // Handle `cargo update --precise` here. If specified, our own source
- // will have a precise version listed of the form `<pkg>=<req>` where
- // `<pkg>` is the name of a crate on this source and `<req>` is the
- // version requested (agument to `--precise`).
- summaries.retain(|s| {
- match self.source_id.precise() {
- Some(p) if p.starts_with(dep.name()) &&
- p[dep.name().len()..].starts_with("=") => {
- let vers = &p[dep.name().len() + 1..];
- s.version().to_string() == vers
- }
- _ => true,
- }
- });
- summaries.query(dep)
- }
-
- fn supports_checksums(&self) -> bool {
- true
- }
-}
-
-impl<'cfg> Source for RegistrySource<'cfg> {
- fn update(&mut self) -> CargoResult<()> {
- // If we have an imprecise version then we don't know what we're going
- // to look for, so we always attempt to perform an update here.
- //
- // If we have a precise version, then we'll update lazily during the
- // querying phase. Note that precise in this case is only
- // `Some("locked")` as other `Some` values indicate a `cargo update
- // --precise` request
- if self.source_id.precise() != Some("locked") {
- try!(self.do_update());
- }
- Ok(())
- }
-
- fn download(&mut self, package: &PackageId) -> CargoResult<Package> {
- let config = try!(self.config());
- let url = try!(config.dl.to_url().map_err(internal));
- let mut url = url.clone();
- url.path_segments_mut().unwrap()
- .push(package.name())
- .push(&package.version().to_string())
- .push("download");
- let krate = try!(self.download_package(package, &url).chain_error(|| {
- internal(format!("failed to download package `{}` from {}",
- package, url))
- }));
- let path = try!(self.unpack_package(package, &krate).chain_error(|| {
- internal(format!("failed to unpack package `{}`", package))
- }));
-
- let mut src = PathSource::new(&path, &self.source_id, self.config);
- try!(src.update());
- src.download(package)
- }
-
- fn fingerprint(&self, pkg: &Package) -> CargoResult<String> {
- Ok(pkg.package_id().version().to_string())
- }
-}
--- /dev/null
+use std::collections::HashMap;
+use std::io::prelude::*;
+use std::fs::File;
+use std::path::Path;
+
+use rustc_serialize::json;
+
+use core::dependency::{Dependency, DependencyInner, Kind};
+use core::{SourceId, Summary, PackageId, Registry};
+use sources::registry::{RegistryPackage, RegistryDependency, INDEX_LOCK};
+use util::{CargoResult, ChainError, internal, Filesystem, human, Config};
+
+pub struct RegistryIndex<'cfg> {
+ source_id: SourceId,
+ path: Filesystem,
+ cache: HashMap<String, Vec<(Summary, bool)>>,
+ hashes: HashMap<(String, String), String>, // (name, vers) => cksum
+ config: &'cfg Config,
+}
+
+impl<'cfg> RegistryIndex<'cfg> {
+ pub fn new(id: &SourceId,
+ path: &Filesystem,
+ config: &'cfg Config) -> RegistryIndex<'cfg> {
+ RegistryIndex {
+ source_id: id.clone(),
+ path: path.clone(),
+ cache: HashMap::new(),
+ hashes: HashMap::new(),
+ config: config,
+ }
+ }
+
+ /// Return the hash listed for a specified PackageId.
+ pub fn hash(&mut self, pkg: &PackageId) -> CargoResult<String> {
+ let key = (pkg.name().to_string(), pkg.version().to_string());
+ if let Some(s) = self.hashes.get(&key) {
+ return Ok(s.clone())
+ }
+ // Ok, we're missing the key, so parse the index file to load it.
+ try!(self.summaries(pkg.name()));
+ self.hashes.get(&key).chain_error(|| {
+ internal(format!("no hash listed for {}", pkg))
+ }).map(|s| s.clone())
+ }
+
+ /// Parse the on-disk metadata for the package provided
+ ///
+ /// Returns a list of pairs of (summary, yanked) for the package name
+ /// specified.
+ pub fn summaries(&mut self, name: &str) -> CargoResult<&Vec<(Summary, bool)>> {
+ if self.cache.contains_key(name) {
+ return Ok(self.cache.get(name).unwrap());
+ }
+ let lock = self.path.open_ro(Path::new(INDEX_LOCK),
+ self.config,
+ "the registry index");
+ let file = lock.and_then(|lock| {
+ let path = lock.path().parent().unwrap();
+ let fs_name = name.chars().flat_map(|c| {
+ c.to_lowercase()
+ }).collect::<String>();
+
+ // see module comment for why this is structured the way it is
+ let path = match fs_name.len() {
+ 1 => path.join("1").join(&fs_name),
+ 2 => path.join("2").join(&fs_name),
+ 3 => path.join("3").join(&fs_name[..1]).join(&fs_name),
+ _ => path.join(&fs_name[0..2])
+ .join(&fs_name[2..4])
+ .join(&fs_name),
+ };
+ File::open(&path).map_err(human)
+ });
+ let summaries = match file {
+ Ok(mut f) => {
+ let mut contents = String::new();
+ try!(f.read_to_string(&mut contents));
+ let ret: CargoResult<Vec<(Summary, bool)>>;
+ ret = contents.lines().filter(|l| l.trim().len() > 0)
+ .map(|l| self.parse_registry_package(l))
+ .collect();
+ try!(ret.chain_error(|| {
+ internal(format!("failed to parse registry's information \
+ for: {}", name))
+ }))
+ }
+ Err(..) => Vec::new(),
+ };
+ let summaries = summaries.into_iter().filter(|summary| {
+ summary.0.package_id().name() == name
+ }).collect();
+ self.cache.insert(name.to_string(), summaries);
+ Ok(self.cache.get(name).unwrap())
+ }
+
+ /// Parse a line from the registry's index file into a Summary for a
+ /// package.
+ ///
+ /// The returned boolean is whether or not the summary has been yanked.
+ fn parse_registry_package(&mut self, line: &str)
+ -> CargoResult<(Summary, bool)> {
+ let RegistryPackage {
+ name, vers, cksum, deps, features, yanked
+ } = try!(json::decode::<RegistryPackage>(line));
+ let pkgid = try!(PackageId::new(&name, &vers, &self.source_id));
+ let deps: CargoResult<Vec<Dependency>> = deps.into_iter().map(|dep| {
+ self.parse_registry_dependency(dep)
+ }).collect();
+ let deps = try!(deps);
+ let summary = try!(Summary::new(pkgid, deps, features));
+ let summary = summary.set_checksum(cksum.clone());
+ self.hashes.insert((name, vers), cksum);
+ Ok((summary, yanked.unwrap_or(false)))
+ }
+
+ /// Converts an encoded dependency in the registry to a cargo dependency
+ fn parse_registry_dependency(&self, dep: RegistryDependency)
+ -> CargoResult<Dependency> {
+ let RegistryDependency {
+ name, req, features, optional, default_features, target, kind
+ } = dep;
+
+ let dep = try!(DependencyInner::parse(&name, Some(&req),
+ &self.source_id));
+ let kind = match kind.as_ref().map(|s| &s[..]).unwrap_or("") {
+ "dev" => Kind::Development,
+ "build" => Kind::Build,
+ _ => Kind::Normal,
+ };
+
+ let platform = match target {
+ Some(target) => Some(try!(target.parse())),
+ None => None,
+ };
+
+ // Unfortunately older versions of cargo and/or the registry ended up
+ // publishing lots of entries where the features array contained the
+ // empty feature, "", inside. This confuses the resolution process much
+ // later on and these features aren't actually valid, so filter them all
+ // out here.
+ let features = features.into_iter().filter(|s| !s.is_empty()).collect();
+
+ Ok(dep.set_optional(optional)
+ .set_default_features(default_features)
+ .set_features(features)
+ .set_platform(platform)
+ .set_kind(kind)
+ .into_dependency())
+ }
+}
+
+impl<'cfg> Registry for RegistryIndex<'cfg> {
+ fn query(&mut self, dep: &Dependency) -> CargoResult<Vec<Summary>> {
+ let mut summaries = {
+ let summaries = try!(self.summaries(dep.name()));
+ summaries.iter().filter(|&&(_, yanked)| {
+ dep.source_id().precise().is_some() || !yanked
+ }).map(|s| s.0.clone()).collect::<Vec<_>>()
+ };
+
+ // Handle `cargo update --precise` here. If specified, our own source
+ // will have a precise version listed of the form `<pkg>=<req>` where
+ // `<pkg>` is the name of a crate on this source and `<req>` is the
+//! version requested (argument to `--precise`).
+ summaries.retain(|s| {
+ match self.source_id.precise() {
+ Some(p) if p.starts_with(dep.name()) &&
+ p[dep.name().len()..].starts_with("=") => {
+ let vers = &p[dep.name().len() + 1..];
+ s.version().to_string() == vers
+ }
+ _ => true,
+ }
+ });
+ summaries.query(dep)
+ }
+
+ fn supports_checksums(&self) -> bool {
+ true
+ }
+}
--- /dev/null
+//! A `Source` for registry-based packages.
+//!
+//! # What's a Registry?
+//!
+//! Registries are central locations where packages can be uploaded to,
+//! discovered, and searched for. The purpose of a registry is to have a
+//! location that serves as permanent storage for versions of a crate over time.
+//!
+//! Compared to git sources, a registry provides many packages as well as many
+//! versions simultaneously. Git sources can also have commits deleted through
+//! rebasings where registries cannot have their versions deleted.
+//!
+//! # The Index of a Registry
+//!
+//! One of the major difficulties with a registry is that hosting so many
+//! packages may quickly run into performance problems when dealing with
+//! dependency graphs. It's infeasible for cargo to download the entire contents
+//! of the registry just to resolve one package's dependencies, for example. As
+//! a result, cargo needs some efficient method of querying what packages are
+//! available on a registry, what versions are available, and what the
+//! dependencies for each version is.
+//!
+//! One method of doing so would be having the registry expose an HTTP endpoint
+//! which can be queried with a list of packages and a response of their
+//! dependencies and versions is returned. This is somewhat inefficient however
+//! as we may have to hit the endpoint many times and we may have already
+//! queried for much of the data locally already (for other packages, for
+//! example). This also involves inventing a transport format between the
+//! registry and Cargo itself, so this route was not taken.
+//!
+//! Instead, Cargo communicates with registries through a git repository
+//! referred to as the Index. The Index of a registry is essentially an easily
+//! query-able version of the registry's database for a list of versions of a
+//! package as well as a list of dependencies for each version.
+//!
+//! Using git to host this index provides a number of benefits:
+//!
+//! * The entire index can be stored efficiently locally on disk. This means
+//! that all queries of a registry can happen locally and don't need to touch
+//! the network.
+//!
+//! * Updates of the index are quite efficient. Using git buys incremental
+//! updates, compressed transmission, etc for free. The index must be updated
+//! each time we need fresh information from a registry, but this is one
+//! update of a git repository that probably hasn't changed a whole lot so
+//! it shouldn't be too expensive.
+//!
+//! Additionally, each modification to the index is just appending a line at
+//! the end of a file (the exact format is described later). This means that
+//! the commits for an index are quite small and easily applied/compressible.
+//!
+//! ## The format of the Index
+//!
+//! The index is a store for the list of versions for all packages known, so its
+//! format on disk is optimized slightly to ensure that `ls registry` doesn't
+//! produce a list of all packages ever known. The index also wants to ensure
+//! that there's not a million files which may actually end up hitting
+//! filesystem limits at some point. To this end, a few decisions were made
+//! about the format of the registry:
+//!
+//! 1. Each crate will have one file corresponding to it. Each version for a
+//! crate will just be a line in this file.
+//! 2. There will be two tiers of directories for crate names, under which
+//! crates corresponding to those tiers will be located.
+//!
+//! As an example, this is an example hierarchy of an index:
+//!
+//! ```notrust
+//! .
+//! ├── 3
+//! │ └── u
+//! │ └── url
+//! ├── bz
+//! │ └── ip
+//! │ └── bzip2
+//! ├── config.json
+//! ├── en
+//! │ └── co
+//! │ └── encoding
+//! └── li
+//! ├── bg
+//! │ └── libgit2
+//! └── nk
+//! └── link-config
+//! ```
+//!
+//! The root of the index contains a `config.json` file with a few entries
+//! corresponding to the registry (see `RegistryConfig` below).
+//!
+//! Otherwise, there are three numbered directories (1, 2, 3) for crates with
+//! names 1, 2, and 3 characters in length. The 1/2 directories simply have the
+//! crate files underneath them, while the 3 directory is sharded by the first
+//! letter of the crate name.
+//!
+//! Otherwise the top-level directory contains many two-letter directory names,
+//! each of which has many sub-folders with two letters. At the end of all these
+//! are the actual crate files themselves.
+//!
+//! The purpose of this layout is to hopefully cut down on `ls` sizes as well
+//! as to provide efficient lookup based on the crate name itself.
+//!
+//! ## Crate files
+//!
+//! Each file in the index is the history of one crate over time. Each line in
+//! the file corresponds to one version of a crate, stored in JSON format (see
+//! the `RegistryPackage` structure below).
+//!
+//! As new versions are published, new lines are appended to this file. The only
+//! modifications to this file that should happen over time are yanks of a
+//! particular version.
+//!
+//! # Downloading Packages
+//!
+//! The purpose of the Index was to provide an efficient method to resolve the
+//! dependency graph for a package. So far we have only required one network
+//! interaction to update the registry's repository (yay!). After resolution
+//! has been performed, however, we need to download the contents of packages
+//! so we can read the full manifest and build the source code.
+//!
+//! To accomplish this, this source's `download` method will make an HTTP
+//! request per-package requested to download tarballs into a local cache. These
+//! tarballs will then be unpacked into a destination folder.
+//!
+//! Note that because versions uploaded to the registry are frozen forever,
+//! the HTTP download and unpacking can all be skipped if the version has
+//! already been downloaded and unpacked. This caching allows us to only
+//! download a package when absolutely necessary.
+//!
+//! # Filesystem Hierarchy
+//!
+//! Overall, the `$HOME/.cargo` looks like this when talking about the registry:
+//!
+//! ```notrust
+//! # A folder under which all registry metadata is hosted (similar to
+//! # $HOME/.cargo/git)
+//! $HOME/.cargo/registry/
+//!
+//! # For each registry that cargo knows about (keyed by hostname + hash)
+//! # there is a folder which is the checked out version of the index for
+//! # the registry in this location. Note that this is done so cargo can
+//! # support multiple registries simultaneously
+//! index/
+//! registry1-<hash>/
+//! registry2-<hash>/
+//! ...
+//!
+//! # This folder is a cache for all downloaded tarballs from a registry.
+//! # Once downloaded and verified, a tarball never changes.
+//! cache/
+//! registry1-<hash>/<pkg>-<version>.crate
+//! ...
+//!
+//! # Location in which all tarballs are unpacked. Each tarball is known to
+//! # be frozen after downloading, so transitively this folder is also
+//! # frozen once it's unpacked (it's never unpacked again)
+//! src/
+//! registry1-<hash>/<pkg>-<version>/...
+//! ...
+//! ```
+
+use std::collections::HashMap;
+use std::fs::File;
+use std::path::PathBuf;
+
+use flate2::read::GzDecoder;
+use tar::Archive;
+
+use core::{Source, SourceId, PackageId, Package, Summary, Registry};
+use core::dependency::Dependency;
+use sources::PathSource;
+use util::{CargoResult, Config, internal, ChainError, FileLock, Filesystem};
+use util::hex;
+
+const INDEX_LOCK: &'static str = ".cargo-index-lock";
+pub static CRATES_IO: &'static str = "https://github.com/rust-lang/crates.io-index";
+
+pub struct RegistrySource<'cfg> {
+ source_id: SourceId,
+ src_path: Filesystem,
+ config: &'cfg Config,
+ updated: bool,
+ ops: Box<RegistryData + 'cfg>,
+ index: index::RegistryIndex<'cfg>,
+}
+
+#[derive(RustcDecodable)]
+pub struct RegistryConfig {
+ /// Download endpoint for all crates. This will be appended with
+ /// `/<crate>/<version>/download` and then will be hit with an HTTP GET
+ /// request to download the tarball for a crate.
+ pub dl: String,
+
+ /// API endpoint for the registry. This is what's actually hit to perform
+ /// operations like yanks, owner modifications, publish new crates, etc.
+ pub api: String,
+}
+
+#[derive(RustcDecodable)]
+struct RegistryPackage {
+ name: String,
+ vers: String,
+ deps: Vec<RegistryDependency>,
+ features: HashMap<String, Vec<String>>,
+ cksum: String,
+ yanked: Option<bool>,
+}
+
+#[derive(RustcDecodable)]
+struct RegistryDependency {
+ name: String,
+ req: String,
+ features: Vec<String>,
+ optional: bool,
+ default_features: bool,
+ target: Option<String>,
+ kind: Option<String>,
+}
+
+pub trait RegistryData {
+ fn index_path(&self) -> &Filesystem;
+ fn config(&self) -> CargoResult<Option<RegistryConfig>>;
+ fn update_index(&mut self) -> CargoResult<()>;
+ fn download(&mut self,
+ pkg: &PackageId,
+ checksum: &str) -> CargoResult<FileLock>;
+}
+
+mod index;
+mod remote;
+
+fn short_name(id: &SourceId) -> String {
+ let hash = hex::short_hash(id);
+ let ident = id.url().host_str().unwrap_or("").to_string();
+ format!("{}-{}", ident, hash)
+}
+
+impl<'cfg> RegistrySource<'cfg> {
+ pub fn remote(source_id: &SourceId,
+ config: &'cfg Config) -> RegistrySource<'cfg> {
+ let name = short_name(source_id);
+ let ops = remote::RemoteRegistry::new(source_id, config, &name);
+ RegistrySource::new(source_id, config, &name, Box::new(ops))
+ }
+
+ fn new(source_id: &SourceId,
+ config: &'cfg Config,
+ name: &str,
+ ops: Box<RegistryData + 'cfg>) -> RegistrySource<'cfg> {
+ RegistrySource {
+ src_path: config.registry_source_path().join(name),
+ config: config,
+ source_id: source_id.clone(),
+ updated: false,
+ index: index::RegistryIndex::new(source_id,
+ ops.index_path(),
+ config),
+ ops: ops,
+ }
+ }
+
+ /// Decode the configuration stored within the registry.
+ ///
+ /// This requires that the index has been at least checked out.
+ pub fn config(&self) -> CargoResult<Option<RegistryConfig>> {
+ self.ops.config()
+ }
+
+ /// Unpacks a downloaded package into a location where it's ready to be
+ /// compiled.
+ ///
+ /// No action is taken if the source looks like it's already unpacked.
+ fn unpack_package(&self,
+ pkg: &PackageId,
+ tarball: &FileLock)
+ -> CargoResult<PathBuf> {
+ let dst = self.src_path.join(&format!("{}-{}", pkg.name(),
+ pkg.version()));
+ try!(dst.create_dir());
+ // Note that we've already got the `tarball` locked above, and that
+ // implies a lock on the unpacked destination as well, so this access
+ // via `into_path_unlocked` should be ok.
+ let dst = dst.into_path_unlocked();
+ let ok = dst.join(".cargo-ok");
+ if ok.exists() {
+ return Ok(dst)
+ }
+
+ let gz = try!(GzDecoder::new(tarball.file()));
+ let mut tar = Archive::new(gz);
+ try!(tar.unpack(dst.parent().unwrap()));
+ try!(File::create(&ok));
+ Ok(dst)
+ }
+
+ fn do_update(&mut self) -> CargoResult<()> {
+ try!(self.ops.update_index());
+ let path = self.ops.index_path();
+ self.index = index::RegistryIndex::new(&self.source_id,
+ path,
+ self.config);
+ Ok(())
+ }
+}
+
+impl<'cfg> Registry for RegistrySource<'cfg> {
+ fn query(&mut self, dep: &Dependency) -> CargoResult<Vec<Summary>> {
+ // If this is a precise dependency, then it came from a lockfile and in
+ // theory the registry is known to contain this version. If, however, we
+ // come back with no summaries, then our registry may need to be
+ // updated, so we fall back to performing a lazy update.
+ if dep.source_id().precise().is_some() && !self.updated {
+ if try!(self.index.query(dep)).is_empty() {
+ try!(self.do_update());
+ }
+ }
+
+ self.index.query(dep)
+ }
+
+ fn supports_checksums(&self) -> bool {
+ true
+ }
+}
+
+impl<'cfg> Source for RegistrySource<'cfg> {
+ fn update(&mut self) -> CargoResult<()> {
+ // If we have an imprecise version then we don't know what we're going
+ // to look for, so we always attempt to perform an update here.
+ //
+ // If we have a precise version, then we'll update lazily during the
+ // querying phase. Note that precise in this case is only
+ // `Some("locked")` as other `Some` values indicate a `cargo update
+ // --precise` request
+ if self.source_id.precise() != Some("locked") {
+ try!(self.do_update());
+ }
+ Ok(())
+ }
+
+ fn download(&mut self, package: &PackageId) -> CargoResult<Package> {
+ let hash = try!(self.index.hash(package));
+ let path = try!(self.ops.download(package, &hash));
+ let path = try!(self.unpack_package(package, &path).chain_error(|| {
+ internal(format!("failed to unpack package `{}`", package))
+ }));
+ let mut src = PathSource::new(&path, &self.source_id, self.config);
+ try!(src.update());
+ src.download(package)
+ }
+
+ fn fingerprint(&self, pkg: &Package) -> CargoResult<String> {
+ Ok(pkg.package_id().version().to_string())
+ }
+}
--- /dev/null
+use std::io::SeekFrom;
+use std::io::prelude::*;
+use std::path::Path;
+
+use curl::easy::Easy;
+use git2;
+use rustc_serialize::json;
+use rustc_serialize::hex::ToHex;
+
+use core::{PackageId, SourceId};
+use ops;
+use sources::git;
+use sources::registry::{RegistryData, RegistryConfig, INDEX_LOCK};
+use util::network;
+use util::paths;
+use util::{FileLock, Filesystem};
+use util::{Config, CargoResult, ChainError, human, Sha256, ToUrl};
+
+pub struct RemoteRegistry<'cfg> {
+ index_path: Filesystem,
+ cache_path: Filesystem,
+ source_id: SourceId,
+ config: &'cfg Config,
+ handle: Option<Easy>,
+}
+
+impl<'cfg> RemoteRegistry<'cfg> {
+ pub fn new(source_id: &SourceId, config: &'cfg Config, name: &str)
+ -> RemoteRegistry<'cfg> {
+ RemoteRegistry {
+ index_path: config.registry_index_path().join(name),
+ cache_path: config.registry_cache_path().join(name),
+ source_id: source_id.clone(),
+ config: config,
+ handle: None,
+ }
+ }
+}
+
+impl<'cfg> RegistryData for RemoteRegistry<'cfg> {
+ fn index_path(&self) -> &Filesystem {
+ &self.index_path
+ }
+
+ fn config(&self) -> CargoResult<Option<RegistryConfig>> {
+ let lock = try!(self.index_path.open_ro(Path::new(INDEX_LOCK),
+ self.config,
+ "the registry index"));
+ let path = lock.path().parent().unwrap();
+ let contents = try!(paths::read(&path.join("config.json")));
+ let config = try!(json::decode(&contents));
+ Ok(Some(config))
+ }
+
+ fn update_index(&mut self) -> CargoResult<()> {
+ try!(self.index_path.create_dir());
+ let lock = try!(self.index_path.open_rw(Path::new(INDEX_LOCK),
+ self.config,
+ "the registry index"));
+ let path = lock.path().parent().unwrap();
+
+ try!(self.config.shell().status("Updating",
+ format!("registry `{}`", self.source_id.url())));
+ let repo = try!(git2::Repository::open(path).or_else(|_| {
+ let _ = lock.remove_siblings();
+ git2::Repository::init(path)
+ }));
+
+ // git fetch origin
+ let url = self.source_id.url().to_string();
+ let refspec = "refs/heads/*:refs/remotes/origin/*";
+
+ try!(git::fetch(&repo, &url, refspec, &self.config).chain_error(|| {
+ human(format!("failed to fetch `{}`", url))
+ }));
+
+ // git reset --hard origin/master
+ let reference = "refs/remotes/origin/master";
+ let oid = try!(repo.refname_to_id(reference));
+ trace!("[{}] updating to rev {}", self.source_id, oid);
+ let object = try!(repo.find_object(oid, None));
+ try!(repo.reset(&object, git2::ResetType::Hard, None));
+ Ok(())
+ }
+
+ fn download(&mut self, pkg: &PackageId, checksum: &str)
+ -> CargoResult<FileLock> {
+ let filename = format!("{}-{}.crate", pkg.name(), pkg.version());
+ let path = Path::new(&filename);
+ let mut dst = try!(self.cache_path.open_rw(path, self.config, &filename));
+ let meta = try!(dst.file().metadata());
+ if meta.len() > 0 {
+ return Ok(dst)
+ }
+ try!(self.config.shell().status("Downloading", pkg));
+
+ let config = try!(self.config()).unwrap();
+ let mut url = try!(config.dl.to_url());
+ url.path_segments_mut().unwrap()
+ .push(pkg.name())
+ .push(&pkg.version().to_string())
+ .push("download");
+
+ let handle = match self.handle {
+ Some(ref mut handle) => handle,
+ None => {
+ self.handle = Some(try!(ops::http_handle(self.config)));
+ self.handle.as_mut().unwrap()
+ }
+ };
+ // TODO: don't download into memory, but ensure that if we ctrl-c a
+ // download we should resume either from the start or the middle
+ // on the next time
+ try!(handle.get(true));
+ try!(handle.url(&url.to_string()));
+ try!(handle.follow_location(true));
+ let mut state = Sha256::new();
+ let mut body = Vec::new();
+ {
+ let mut handle = handle.transfer();
+ try!(handle.write_function(|buf| {
+ state.update(buf);
+ body.extend_from_slice(buf);
+ Ok(buf.len())
+ }));
+ try!(network::with_retry(self.config, || {
+ handle.perform()
+ }))
+ }
+ let code = try!(handle.response_code());
+ if code != 200 && code != 0 {
+ bail!("failed to get 200 response from `{}`, got {}", url, code)
+ }
+
+ // Verify what we just downloaded
+ if state.finish().to_hex() != checksum {
+ bail!("failed to verify the checksum of `{}`", pkg)
+ }
+
+ try!(dst.write_all(&body));
+ try!(dst.seek(SeekFrom::Start(0)));
+ Ok(dst)
+ }
+}
Caused by:
failed to download replaced source `registry https://[..]`
-Caused by:
- failed to download package `bad-cksum v0.0.1 (registry file://[..])` from [..]
-
Caused by:
failed to verify the checksum of `bad-cksum v0.0.1 (registry file://[..])`
"));